% Ziebart et al.: maximum-entropy formulation of inverse reinforcement learning (AAAI 2008).
@inproceedings{Ziebart_2008_6055,
  author    = {Ziebart, Brian D. and Maas, Andrew and Bagnell, J. Andrew and Dey, Anind K.},
  title     = {Maximum Entropy Inverse Reinforcement Learning},
  booktitle = {Proceedings of the Twenty-Third {AAAI} Conference on Artificial Intelligence},
  pages     = {1433--1438},
  month     = jul,
  year      = {2008},
}
% Ziebart et al.: context-aware route/behaviour prediction from observed driving (UbiComp 2008).
@inproceedings{bziebart2008navigate,
  author    = {Ziebart, Brian D. and Maas, Andrew and Bagnell, J. Andrew and Dey, Anind K.},
  title     = {Navigate Like a Cabbie: Probabilistic Reasoning from Observed Context-Aware Behavior},
  booktitle = {Proceedings of the 10th International Conference on Ubiquitous Computing ({UbiComp})},
  pages     = {322--331},
  year      = {2008},
}
% Ng and Russell: foundational algorithms for inverse reinforcement learning (ICML 2000).
% The booktitle carries no leading "in": bibliography styles add that word themselves.
@inproceedings{Ng00algorithmsfor,
  author    = {Ng, Andrew Y. and Russell, Stuart},
  title     = {Algorithms for Inverse Reinforcement Learning},
  booktitle = {Proceedings of the Seventeenth International Conference on Machine Learning},
  pages     = {663--670},
  publisher = {Morgan Kaufmann},
  year      = {2000},
}
% Abbeel and Ng: apprenticeship learning via IRL (ICML 2004).
% The ACM export gave an open page range ("1--"); the paper is identified by article number 1.
@inproceedings{Abbeel:2004:ALV:1015330.1015430,
  author    = {Abbeel, Pieter and Ng, Andrew Y.},
  title     = {Apprenticeship Learning via Inverse Reinforcement Learning},
  booktitle = {Proceedings of the Twenty-first International Conference on Machine Learning},
  series    = {ICML '04},
  year      = {2004},
  isbn      = {1-58113-838-5},
  location  = {Banff, Alberta, Canada},
  pages     = {1},
  url       = {https://doi.org/10.1145/1015330.1015430},
  doi       = {10.1145/1015330.1015430},
  acmid     = {1015430},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
% Henry et al.: IRL-based robot navigation in crowds (ICRA 2010).
% The booktitle carries no leading "In": bibliography styles add that word themselves.
@inproceedings{Henry10learningto,
  author    = {Henry, Peter and Vollmer, Christian and Ferris, Brian and Fox, Dieter},
  title     = {Learning to Navigate Through Crowded Environments},
  booktitle = {Proceedings of the {IEEE} International Conference on Robotics and Automation ({ICRA})},
  pages     = {981--986},
  year      = {2010},
}
% Russell: extended abstract that poses the inverse reinforcement learning problem (COLT 1998).
@inproceedings{Russell:1998:LAU:279943.279964,
  author    = {Russell, Stuart},
  title     = {Learning Agents for Uncertain Environments (Extended Abstract)},
  booktitle = {Proceedings of the Eleventh Annual Conference on Computational Learning Theory},
  series    = {COLT '98},
  year      = {1998},
  isbn      = {1-58113-057-0},
  location  = {Madison, Wisconsin, USA},
  pages     = {101--103},
  numpages  = {3},
  url       = {https://doi.org/10.1145/279943.279964},
  doi       = {10.1145/279943.279964},
  acmid     = {279964},
  publisher = {ACM},
  address   = {New York, NY, USA},
}

% Sutton and Barto: standard reinforcement learning textbook, first edition.
% The exported record listed the title as "Introduction to Reinforcement Learning";
% the book's actual title is given below.
@book{Sutton:1998:IRL:551283,
  author    = {Sutton, Richard S. and Barto, Andrew G.},
  title     = {Reinforcement Learning: An Introduction},
  year      = {1998},
  isbn      = {0262193981},
  edition   = {First},
  publisher = {MIT Press},
  address   = {Cambridge, MA, USA},
}

% Bertsekas and Tsitsiklis: monograph on approximate dynamic programming.
@book{Bertsekas:1996:NP:560669,
  author    = {Bertsekas, Dimitri P. and Tsitsiklis, John N.},
  title     = {Neuro-Dynamic Programming},
  year      = {1996},
  isbn      = {1886529108},
  edition   = {First},
  publisher = {Athena Scientific},
  address   = {Belmont, MA, USA},
}
% Ratliff et al.: maximum margin planning (ICML 2006).
% The conference acronym lives in `series`, so the booktitle stays plain ASCII
% with no dangling parenthesis.
@inproceedings{Ratliff06maximummargin,
  author    = {Ratliff, Nathan D. and Bagnell, J. Andrew and Zinkevich, Martin A.},
  title     = {Maximum Margin Planning},
  booktitle = {Proceedings of the 23rd International Conference on Machine Learning},
  series    = {ICML '06},
  pages     = {729--736},
  year      = {2006},
}
% Ramachandran and Amir: Bayesian treatment of inverse reinforcement learning (IJCAI 2007).
% "Bayesian" is braced so sentence-casing styles keep its capital.
@inproceedings{Ramachandran07bayesianinverse,
  author    = {Ramachandran, Deepak and Amir, Eyal},
  title     = {{Bayesian} Inverse Reinforcement Learning},
  booktitle = {Proceedings of the 20th International Joint Conference on Artificial Intelligence},
  pages     = {2586--2591},
  year      = {2007},
}